
# Validate the model: load the saved checkpoint and run one sample generation.
from unsloth import FastLanguageModel

# Load the model and tokenizer from the local "ckpt/r1-sft1" checkpoint
# directory, with the load_in_4bit option enabled.
model, tokenizer = FastLanguageModel.from_pretrained(
    "ckpt/r1-sft1",
    load_in_4bit=True,
)

# The prompt is in Chinese; it reads: "Question: 7+3*7=?  Please think step by
# step and give the answer."  The encoded batch is moved to the "cuda" device
# before being handed to the model.
inputs = tokenizer(
    "问题：7+3*7=？\n\n请一步步思考并给出答案。",
    return_tensors="pt",
).to("cuda")

# Generate at most 256 new tokens, then decode and print the first (and only)
# sequence returned for this single-prompt batch.
print(
    tokenizer.decode(
        model.generate(
            **inputs,
            max_new_tokens=256,
        )[0]
    )
)
